@inproceedings{liu1large,
  author    = {Liu, Xing and Chow, Edmond},
  title     = {Large-Scale Hydrodynamic {Brownian} Simulations on Multicore and Manycore Architectures},
  booktitle = {28th {IEEE} International Parallel \& Distributed Processing Symposium},
  year      = {2014},
}

@article{harvey2009implementation,
  author    = {Harvey, M. J. and De Fabritiis, G.},
  title     = {An implementation of the smooth particle mesh {Ewald} method on {GPU} hardware},
  journal   = {Journal of Chemical Theory and Computation},
  volume    = {5},
  number    = {9},
  pages     = {2371--2377},
  year      = {2009},
  publisher = {ACS Publications},
}

% "GPU Gems 3" is an edited book and 39 is the chapter number, so this is
% recorded as a book chapter rather than a journal article.
% NOTE(review): editor and publisher were added from the book's front
% matter -- confirm before publishing.
@incollection{harris2007parallel,
  author    = {Harris, Mark and Sengupta, Shubhabrata and Owens, John D.},
  title     = {Parallel prefix sum (scan) with {CUDA}},
  booktitle = {{GPU} Gems 3},
  editor    = {Nguyen, Hubert},
  chapter   = {39},
  pages     = {851--876},
  publisher = {Addison-Wesley},
  year      = {2007},
}

@techreport{bell2008efficient,
  author      = {Bell, Nathan and Garland, Michael},
  title       = {Efficient sparse matrix-vector multiplication on {CUDA}},
  institution = {NVIDIA Corporation},
  type        = {{NVIDIA} Technical Report},
  number      = {NVR-2008-004},
  year        = {2008},
}

% NOTE(review): the previous title "Ewald summation" named the method, not
% the paper. Title, full journal name, issue and page range were restored
% from the original 1921 publication -- confirm against the publisher record.
@article{ewald1921ewald,
  author  = {Ewald, Paul Peter},
  title   = {Die {Berechnung} optischer und elektrostatischer {Gitterpotentiale}},
  journal = {Annalen der Physik},
  volume  = {369},
  number  = {3},
  pages   = {253--287},
  year    = {1921},
}

@misc{nvidia2014programming,
  author = {NVIDIA},
  title  = {{CUDA C Programming Guide}},
  year   = {2014},
}

@misc{nvidia2012kepler,
  author = {NVIDIA},
  title  = {{NVIDIA Kepler GK110 Architecture Whitepaper}},
  year   = {2012},
}

@article{essmann1995smooth,
  author    = {Essmann, Ulrich and Perera, Lalith and Berkowitz, Max L. and Darden, Tom and Lee, Hsing and Pedersen, Lee G.},
  title     = {A smooth particle mesh {Ewald} method},
  journal   = {The Journal of Chemical Physics},
  volume    = {103},
  number    = {19},
  pages     = {8577--8593},
  year      = {1995},
  publisher = {AIP Publishing},
}


@article{brown2012implementing,
  author    = {Brown, W. Michael and Kohlmeyer, Axel and Plimpton, Steven J. and Tharrington, Arnold N.},
  title     = {Implementing molecular dynamics on hybrid high performance computers -- {Particle}--particle particle-mesh},
  journal   = {Computer Physics Communications},
  volume    = {183},
  number    = {3},
  pages     = {449--459},
  year      = {2012},
  publisher = {Elsevier},
}

@article{gotz2012routine,
  author    = {G{\"o}tz, Andreas W. and Williamson, Mark J. and Xu, Dong and Poole, Duncan and Le Grand, Scott and Walker, Ross C.},
  title     = {Routine microsecond molecular dynamics simulations with {AMBER} on {GPUs}. 1. {Generalized Born}},
  journal   = {Journal of Chemical Theory and Computation},
  volume    = {8},
  number    = {5},
  pages     = {1542--1555},
  year      = {2012},
  publisher = {ACS Publications},
}

@article{ware1998fast,
  author    = {Ware, Antony F.},
  title     = {Fast approximate {Fourier} transforms for irregularly spaced data},
  journal   = {SIAM Review},
  volume    = {40},
  number    = {4},
  pages     = {838--856},
  year      = {1998},
  publisher = {SIAM},
}

@article{dutt1993fast,
  author    = {Dutt, Alok and Rokhlin, Vladimir},
  title     = {Fast {Fourier} transforms for nonequispaced data},
  journal   = {SIAM Journal on Scientific Computing},
  volume    = {14},
  number    = {6},
  pages     = {1368--1393},
  year      = {1993},
  publisher = {SIAM},
}

@article{schomberg1995gridding,
  author    = {Schomberg, Hermann and Timmer, Jan},
  title     = {The gridding method for image reconstruction by {Fourier} transformation},
  journal   = {IEEE Transactions on Medical Imaging},
  volume    = {14},
  number    = {3},
  pages     = {596--607},
  year      = {1995},
  publisher = {IEEE},
}

@article{twieg1983k,
  author    = {Twieg, Donald B.},
  title     = {The k-trajectory formulation of the {NMR} imaging process with applications in analysis and synthesis of imaging methods},
  journal   = {Medical Physics},
  volume    = {10},
  number    = {5},
  pages     = {610--621},
  year      = {1983},
  publisher = {American Association of Physicists in Medicine},
}

% The original author field merged two people ("Soumekh, M" and "Kaveh, M")
% into one name, and the "journal" was actually the title of an edited book.
% NOTE(review): author order is kept as found; the editor and publisher
% imprint were added from memory of the book's front matter -- confirm all
% three, and add the last page of the chapter.
@incollection{soumekh1987computer,
  author    = {Soumekh, M. and Kaveh, M.},
  title     = {Computer-Assisted Diffraction Tomography},
  booktitle = {Image Recovery: Theory and Application},
  editor    = {Stark, Henry},
  pages     = {369},
  publisher = {Academic Press},
  year      = {1987},
}

@inproceedings{Choi:2010:MAS:1693453.1693471,
  author    = {Choi, Jee W. and Singh, Amik and Vuduc, Richard W.},
  title     = {Model-driven Autotuning of Sparse Matrix-vector Multiply on {GPUs}},
  booktitle = {Proceedings of the 15th {ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming},
  series    = {PPoPP '10},
  pages     = {115--126},
  numpages  = {12},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Bangalore, India},
  year      = {2010},
  isbn      = {978-1-60558-877-3},
  doi       = {10.1145/1693453.1693471},
  acmid     = {1693471},
  keywords  = {gpu, performance modeling, sparse matrix-vector multiplication},
}

@inproceedings{Bell:2009:ISM:1654059.1654078,
  author    = {Bell, Nathan and Garland, Michael},
  title     = {Implementing Sparse Matrix-vector Multiplication on Throughput-oriented Processors},
  booktitle = {Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
  series    = {SC '09},
  pages     = {18:1--18:11},
  articleno = {18},
  numpages  = {11},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Portland, Oregon},
  year      = {2009},
  isbn      = {978-1-60558-744-8},
  acmid     = {1654078},
}

@article{darden,
  author    = {Darden, T. and York, D. and Pedersen, L.},
  title     = {Particle mesh {Ewald} -- an {$N \log(N)$} method for {Ewald} sums in large systems},
  journal   = {The Journal of Chemical Physics},
  volume    = {98},
  number    = {12},
  pages     = {10089--10092},
  year      = {1993},
  owner     = {edmond},
  timestamp = {2012.06.29},
}

@article{darve-2005,
  author    = {Saintillan, David and Darve, Eric and Shaqfeh, Eric S. G.},
  title     = {A smooth particle-mesh {Ewald} algorithm for {Stokes} suspension simulations: The sedimentation of fibers},
  journal   = {Physics of Fluids},
  volume    = {17},
  number    = {3},
  pages     = {033301},
  year      = {2005},
  publisher = {AIP},
}

@article{koza2014compressed,
  author    = {Koza, Zbigniew and Matyka, Maciej and Szkoda, Sebastian and Miroslaw, Lukasz},
  title     = {Compressed Multirow Storage Format for Sparse Matrices on Graphics Processing Units},
  journal   = {SIAM Journal on Scientific Computing},
  volume    = {36},
  number    = {2},
  pages     = {C219--C239},
  year      = {2014},
  publisher = {SIAM},
}

@article{kreutzer2014unified,
  author    = {Kreutzer, Moritz and Hager, Georg and Wellein, Gerhard and Fehske, Holger and Bishop, Alan R.},
  title     = {A Unified Sparse Matrix Data Format for Efficient General Sparse Matrix-Vector Multiplication on Modern Processors with Wide {SIMD} Units},
  journal   = {SIAM Journal on Scientific Computing},
  volume    = {36},
  number    = {5},
  pages     = {C401--C423},
  year      = {2014},
  publisher = {SIAM},
}

@article{oberhuber2010new,
  author  = {Oberhuber, Tom{\'a}{\v{s}} and Suzuki, Atsushi and Vacata, Jan},
  title   = {New row-grouped {CSR} format for storing the sparse matrices on {GPU} with implementation in {CUDA}},
  journal = {arXiv preprint arXiv:1012.2270},
  year    = {2010},
}



